bitkeeper revision 1.1159.43.1 (4124b289EjJu2ABgQn-Zz7HxnmkRUQ)

author iap10@labyrinth.cl.cam.ac.uk <iap10@labyrinth.cl.cam.ac.uk>

Thu, 19 Aug 2004 14:00:41 +0000 (14:00 +0000)

committer iap10@labyrinth.cl.cam.ac.uk <iap10@labyrinth.cl.cam.ac.uk>

Thu, 19 Aug 2004 14:00:41 +0000 (14:00 +0000)
author iap10@labyrinth.cl.cam.ac.uk <iap10@labyrinth.cl.cam.ac.uk>
Thu, 19 Aug 2004 14:00:41 +0000 (14:00 +0000)
committer iap10@labyrinth.cl.cam.ac.uk <iap10@labyrinth.cl.cam.ac.uk>
Thu, 19 Aug 2004 14:00:41 +0000 (14:00 +0000)
diff --git a/tools/libxc/xc_linux_save.c b/tools/libxc/xc_linux_save.c

index 5a47b30f5633bca8aac883585385d6d32677359d..6e4bb55b1290c99305b376d0fb181b460b700072 100644 (file)
--- a/tools/libxc/xc_linux_save.c
+++ b/tools/libxc/xc_linux_save.c
@@ -295,7 +295,7 @@ int xc_linux_save(int xc_handle, XcIOContext *ioctxt)
      int rc = 1, i, j, k, last_iter, iter = 0;
      unsigned long mfn;
      u32 domid = ioctxt->domain;
-    int live = 0; // (ioctxt->flags & XCFLAGS_LIVE);
+    int live =  (ioctxt->flags & XCFLAGS_LIVE);
      int debug = (ioctxt->flags & XCFLAGS_DEBUG);
      int sent_last_iter, skip_this_iter;
  
@@ -440,7 +440,8 @@ int xc_linux_save(int xc_handle, XcIOContext *ioctxt)
  
      /* Domain is still running at this point */
  
-    if( live ){ 
+    if( live ){
+printf("GO LIVE!!\n");
          if ( xc_shadow_control( xc_handle, domid, 
                                  DOM0_SHADOW_CONTROL_OP_ENABLE_LOGDIRTY,
                                  NULL, 0, NULL ) < 0 ) {
diff --git a/xen/arch/x86/shadow.c b/xen/arch/x86/shadow.c

index 362b0f4560aafb4e3e9f77ecd419c8aecf53fd90..06445943ab24c7ce1d893ecc62b0c6c994b96224 100644 (file)
--- a/xen/arch/x86/shadow.c
+++ b/xen/arch/x86/shadow.c
@@ -29,41 +29,6 @@ hypercall lock anyhow (at least initially).
  ********/
  
  
-/**
-
-FIXME:
-
-The shadow table flush command is dangerous on SMP systems as the
-guest may be using the L2 on one CPU while the other is trying to 
-blow the table away. 
-
-The current save restore code works around this by not calling FLUSH,
-but by calling CLEAN2 which leaves all L2s intact (this is probably
-quicker anyhow).
-
-Even so, we have to be very careful. The flush code may need to cause
-a TLB flush on another CPU. It needs to do this while holding the
-shadow table lock. The trouble is, the guest may be in the shadow page
-fault handler spinning waiting to grab the shadow lock. It may have
-interrupts disabled, hence we can't use the normal flush_tlb_cpu
-mechanism.
-
-For the moment, we have a grim race whereby the spinlock in the shadow
-fault handler is actually a try lock, in a loop with a helper for the
-tlb flush code.
-
-A better solution would be to take a new flush lock, then raise a
-per-domain soft irq on the other CPU.  The softirq will switch to
-init's PTs, then do an atomic inc of a variable to count himself in,
-then spin on a lock.  Having noticed that the other guy has counted
-in, flush the shadow table, then release him by dropping the lock. He
-will then reload cr3 from mm.page_table on the way out of the softirq.
-
-In domain-softirq context we know that the guy holds no locks and has
-interrupts enabled. Nothing can go wrong ;-)
-
-**/
-
  static inline void free_shadow_page(struct mm_struct *m, 
                                      struct pfn_info *page)
  {
@@ -381,9 +346,9 @@ static int shadow_mode_table_op(struct domain *d,
                 d->mm.shadow_dirty_net_count   = 0;
                 d->mm.shadow_dirty_block_count = 0;
         
-               sc->pages = d->tot_pages;
+               sc->pages = d->max_pages;
  
-               if( d->tot_pages > sc->pages || 
+               if( d->max_pages > sc->pages || 
                         !sc->dirty_bitmap || !d->mm.shadow_dirty_bitmap )
                 {
                         rc = -EINVAL;
@@ -393,10 +358,10 @@ static int shadow_mode_table_op(struct domain *d,
         
  #define chunk (8*1024) // do this in 1KB chunks for L1 cache
         
-               for(i=0;i<d->tot_pages;i+=chunk)
+               for(i=0;i<d->max_pages;i+=chunk)
                 {
-                       int bytes = ((  ((d->tot_pages-i) > (chunk))?
-                                                       (chunk):(d->tot_pages-i) ) + 7) / 8;
+                       int bytes = ((  ((d->max_pages-i) > (chunk))?
+                                                       (chunk):(d->max_pages-i) ) + 7) / 8;
             
                         copy_to_user( sc->dirty_bitmap + (i/(8*sizeof(unsigned long))),
                                                   d->mm.shadow_dirty_bitmap +(i/(8*sizeof(unsigned long))),
@@ -428,21 +393,21 @@ static int shadow_mode_table_op(struct domain *d,
                 sc->stats.dirty_net_count   = d->mm.shadow_dirty_net_count;
                 sc->stats.dirty_block_count = d->mm.shadow_dirty_block_count;
         
-               if( d->tot_pages > sc->pages || 
+               if( d->max_pages > sc->pages || 
                         !sc->dirty_bitmap || !d->mm.shadow_dirty_bitmap )
                 {
                         rc = -EINVAL;
                         goto out;
                 }
         
-               sc->pages = d->tot_pages;
+               sc->pages = d->max_pages;
         
  #define chunk (8*1024) // do this in 1KB chunks for L1 cache
         
-               for(i=0;i<d->tot_pages;i+=chunk)
+               for(i=0;i<d->max_pages;i+=chunk)
                 {
-                       int bytes = ((  ((d->tot_pages-i) > (chunk))?
-                                                       (chunk):(d->tot_pages-i) ) + 7) / 8;
+                       int bytes = ((  ((d->max_pages-i) > (chunk))?
+                                                       (chunk):(d->max_pages-i) ) + 7) / 8;
             
                         copy_to_user( sc->dirty_bitmap + (i/(8*sizeof(unsigned long))),
                                                   d->mm.shadow_dirty_bitmap +(i/(8*sizeof(unsigned long))),
@@ -475,7 +440,13 @@ int shadow_mode_control(struct domain *d, dom0_shadow_control_t *sc)
      unsigned int cmd = sc->op;
      int rc = 0;
  
-    spin_lock(&d->mm.shadow_lock);
+       if (d == current)
+               printk("Attempt to control your _own_ shadow tables. I hope you know what you're doing!\n");
+
+       domain_pause(d);
+       synchronise_pagetables(d->processor);
+
+       spin_lock(&d->mm.shadow_lock);
  
      if ( cmd == DOM0_SHADOW_CONTROL_OP_OFF )
      {
@@ -502,10 +473,10 @@ int shadow_mode_control(struct domain *d, dom0_shadow_control_t *sc)
          rc = -EINVAL;
      }
  
-       flush_tlb_cpu(d->processor);
-   
      spin_unlock(&d->mm.shadow_lock);
  
+       domain_unpause(d);
+
      return rc;
  }
  
@@ -518,6 +489,7 @@ static inline struct pfn_info *alloc_shadow_page(struct mm_struct *m)
  void unshadow_table( unsigned long gpfn, unsigned int type )
  {
      unsigned long spfn;
+       struct domain *d = frame_table[gpfn].u.inuse.domain;
  
      SH_VLOG("unshadow_table type=%08x gpfn=%08lx",
              type,
@@ -530,11 +502,11 @@ void unshadow_table( unsigned long gpfn, unsigned int type )
      // even in the SMP guest case, there won't be a race here as
      // this CPU was the one that cmpxchg'ed the page to invalid
  
-    spfn = __shadow_status(&current->mm, gpfn) & PSH_pfn_mask;
+    spfn = __shadow_status(&d->mm, gpfn) & PSH_pfn_mask;
  
-    delete_shadow_status(&current->mm, gpfn);
+    delete_shadow_status(&d->mm, gpfn);
  
-    free_shadow_page( &current->mm, &frame_table[spfn] );
+    free_shadow_page(&d->mm, &frame_table[spfn] );
  
  }
  
@@ -651,15 +623,7 @@ int shadow_fault( unsigned long va, long error_code )
  
      // take the lock and reread gpte
  
-    while( unlikely(!spin_trylock(&current->mm.shadow_lock)) )
-       {
-               extern volatile unsigned long flush_cpumask;
-               if ( test_and_clear_bit(smp_processor_id(), &flush_cpumask) )
-                       local_flush_tlb();
-               rep_nop();
-       }
-       
-       ASSERT(spin_is_locked(&current->mm.shadow_lock));
+       spin_lock(&current->mm.shadow_lock);
         
      if ( unlikely(__get_user(gpte, (unsigned long*)&linear_pg_table[va>>PAGE_SHIFT])) )
      {
author	iap10@labyrinth.cl.cam.ac.uk <iap10@labyrinth.cl.cam.ac.uk>
	Thu, 19 Aug 2004 14:00:41 +0000 (14:00 +0000)
committer	iap10@labyrinth.cl.cam.ac.uk <iap10@labyrinth.cl.cam.ac.uk>
	Thu, 19 Aug 2004 14:00:41 +0000 (14:00 +0000)
tools/libxc/xc_linux_save.c		patch \| blob \| history
xen/arch/x86/shadow.c		patch \| blob \| history